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FIG. 1A 

GAATTCGCGTCGAATCATTGTCTGTTCGGTATCGATTCAGAAACCGAAACTTGTGATCGA 

TAACAAGTCATTCAAACACGGCGAAGATGTCTATGCGTATAACAGAATATTTGGAGAAAT ^ EC E I VE D 

61 + -- + + + + + 120 

GCTCGCAAAACTCGAAATTGTCACCGATAAAATGATTAACTTGAAGGGGCTAATGTAAGT _ _ _ m 

121 + + .- + + + + 180 ^PR 1 5 2003 

TATCTGATGTTTCTACAATTAAAAAAATTGTTTTTTTTTCCAAATTAATTTTCGAAGATT 

AACGAAAAACGATTAAAAATCAATAAAACGCAATAAAGAGGGCT 1 600/2900 

241 -_- + .__ + + + + + 300 

TTAAATTATAATTTTTCTGATTGTTGTATGAAGCTACAAAATGTACTGTTTTTGTATTTG 
301 + + + -- + + + 360 

AATATTGTATTACAGGGTTGGGATTCTCGGCAAATATCAGCGACAGTGGAAGATTTAGAA 
361 + + + + + + 420 

GAAGGACGTGTGACAATCACTAAGTCAAAGAGGGAAAGGATAAAGGATTGTGATATTTCA 
421 + + + + + + 480 

CTGTTTTACTCATTCGCTTTTTAAATAAGAACTATATGCCGATTTGCCGATATATTTTTG 
481 --- - + + + -- - + + -- --+ 540 

TTTATTAGGCCTCTCACATTCCTGTACAATGTTTCTACCAAATAAACTGCATTTTTATCT 
541 + + + + + + 600 

GAAAATTCGAATTTATTTTTGTCTACTTTTTACTCGTTGCATTCGAGATCAGCATATCTT 
601 + + -- -- + - --- + + - ---+ 660 

CCGGTCTATTTATATTCAACGATTTTTATAAATTAGTACTCCTTCATGTTTAATTTCATT 
661 + + + + + + 720 

TTATCTGTAAGCTTTACTGTATTTTTTTAAAATCTTTCTTGCTTCTATCTGATTATACAA 
721 + + + + + + 780 

TGTTCTTTACTCATTTTCAAGGTATTTTTATGCCTCACAATTTATGCACATTTCGGGCTT 
781 + + + + + + 840 

GGAGATTTATCCTCTATATTACATGCCTGTTTTTTTAAAGGATATAATGTTTAACAAATA 
841 + + + + + + 900 

ATTTTTTATCAATGPTATTGTATATTCTCCAGCTAACCGTTGTTTCGAAAACATCACCTA 
901 --- + + + + + . + 960 

GCATTTTAAAATTCACAAAATCTTGCTTCCTTATAATCAAGAAGATTTTTCAGATGCTCT 
961 + + + + + + 1020 

M L C 

1 u 

GCGAAATCGAATGCCGCGCTTTGAGCACGGCACACACGAGGCTCATCCACGACTTTGAAC 
1021 + + + + + + 1080 

EIECRALSTAHTRLIHDFEP 

10 20 

T nll62 
t 

CACGTGACGCATTGACTTATTTAGAAGGCAAAAACATTTTCACAGAAGATCATTCTGAAC 
1081 + + + + + + 1140 

RDALTYLEGKNIFTEDHSEL 

30 40 

TTATCAGTAAAATGTCAACTCGCCTCGAGAGGATCGCCAATTTTCTTCGAATCTATCGAC 
1141 + + + + + + 1200 

ISKMSTRLERIANFLRIYRR 
50 60 
GTCAAGCTTCTGAACTTGGACCACTCATCGACTTTTTCAACTACAACAATCAAAGTCACC 
1201 + + + + + + 1260 

QASELGPLIDFFNYNNQSHL 

70 80 
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FIG. 1B 

TTGCTGATTTCCTCGAAGACTACATCGATTTTGCGATAAATGAGCCAGATCTACTTCGTC 

1261 + + + + + + 1320 

ADFLEDYIDFAINEPDLLRP 

90 100 
CAGTAGTGATTGCTCCACAATTTTCCCGACAAATGCTCGATAGGAAACTATTGCTTGGGA 

1321 + + + + + + 1380 

VVIAPQFSRQMLDRKLLLGN 
110 120 

T n2274 Q 

t Ui 

ATGTTCCAAAACAAATGACATGCTATATTCGAGAGTATCACGTGGATCGAGTGATCAAAA ^ 

1381 + + + + + + 1440 

VPKQMTCYIREYHVDRVIKK 
130 140 

v I Intron 1 Uj §f 

AGCTCGACGAGATGTGTGATTTAGGTGAGAAAACTGGAAGCTCTCGTGTTTATTATAATC Q£ «Z 

1441 + + — - + + + + 1500 

LDEMCDLD 
I 150 

TTGCTTAAACTTCAGkcTCCTTTTTTCTGTTTCTACACGGCCGAGCTGGATCCGGAAAAT 

1501 + + + + + + 1560 

SFFLFLHGRAGSGKS 

160 

I Intron 2 

CAGTAATTGCATCACAAGCTCTTTCGAAATCTGACCAACTTATTGGAATGTGAGTGGTAT 

1561 + + + + + + 1620 

VIASQALSKSDQLIGI 
170 I 180 

TATCTGAATCTACGGATCTTCATTCTATTACAGRAATTATGATTCAATCGTTTGGCTCAA 

1621 + + + ---' + + + 1680 

NYDSIVWLK 

190 

AGATAGTGGAACAGCTCCAAAATCTACATTCGATTTATTTACGGATATTTTGCTGATGCT 
1681 + + + + + + 1740 

DSGTAPKSTFDLFTDILLML 

200 210 

A nl920/n2247 
If Intron 3 

AAAGTGAGTGAATAGAGTGCATGTAACATTCAGCATGATTTTGAAATTATGAAAATTTGA 

1741 --J + + + - + + + 1800 

K 

CCTGGTTAGCTTTTAATTTGATATTTCGTGACGCTTGCATGTTTTGTGTGTTTGAAGACG 

1801 + + + - + -- -- + + 1860 

AGCCCGTGTTGTGAGCGACACGGATGACTCGCATTCGATCACCGACTTCATTAACCGTGT 

1861 + + + -- -- + + + 1920 

A 1X2273 



tctttcaagUagcgaagacgatcttctcaatttcccatcggtggagcatgtcacgtcagt 

1921 -- -- + + -- -- + + + + 1980 

SEDDLLNFPSVEHVTSV 

220 
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FIG. 1C 

| Intron 4 

TGTACTCAAAAGGATqGTAAGTTGCTTGCCGATTCTGGTACAATATCTTAAATTATTGGT 

1981 + J--- + + + + + 2040 

V L K R M 

230 | 

ttttagIatctgcaacgcactcattgatcgtccaaatactttattcgtatttgatgacgta 

2041 J--- + + + + + + 2100 

ICNALIDRPNTLFVFDDV Q 

240 250 qj 

A nl948 T nl947 ^ 

gttcaagaagaaacaattcgttgggctcaggagctacgtcttcgatgtcttgtaactact LLJ 

2101 + + + + + + 2160 

VQEETI RWAQELRLRCLVTT |JJ £ 

260 270 £f* <t 

CGTGACGTGGAAATATCAAATGCTGCTTCTCAAACATGCGAATTCATTGAAGTGACATCA 

2161 + + + + + + 2220 

RDVEISNAASQTCEFIEVTS 

280 290 
TTGGAAATCGATGAATGTTATGATTTTCTAGAAGCTTATGGAATGCCGATGCCTGTTGGA 
2221 + + + + + + 2280 

LEIDECYDFLEAYGMPMPVG 

300 310 
Tc4 nl416 
I 

GAAAAAGAAGAAGATGTGCTTAATAAAACAATCGAACTAAGCAGTGGAAATCCAGCAACG 
2281 + + + + + + 2340 

EKEEDVLNKTIELS SGNPAT 

320 330 

ilntron 5 

CTTATGATGTTTTTCAAGTCTTGTGAACCGAAAACATTTGAAAAGTTGAGTGGGACATACC 

2341 + + + + + + 2400 

LMMFFKSCEPKTFEK 

330 

AATTTGAGACTTTTAAAATAATTTATTCTACAATAAAAGTTAATCAAAAAGTTTCATAGC 

2401 + + + + + + 2460 

TGATTGTCTTTAAATTTTACGAATTGAGGATCAAAATCAAGAATTAGGATCCTGGCACGA 

2461 + + + + + + 2520 

GAGAAAACTGTGTAGCTACCGTACCCGAGAGATTTTCTTGATATTTGCCATCGATTTAAT 

2521 + + + + + + 2580 

TTTTTAAGAAAATTATCGTTTTACATAATTGAACAAGAGATACACGGTCTCGACCCGACG 

2581 + + + + + + 2640 

GAAATTTTTTAAATGAAAGCGAGTATGAGCCTGTTTTCATTATTTTTCGATTTTCTCTTG 

2641 + + + + + + 2700 

TTGTTTCTTTTTATTTAAAGCCTTTTATTTTGAAACAAGTCTAAAAATATTAAAAACTGA 

2701 + + + + + + 2760 

ATAAAATATTTAAAAAAAATCAAGTAAAATAGAAAAACAGCAAGGCTGGAGACTACTGTA 

2761 + + + + -- -- + + 2820 

CTTCTTAAATCCGCATACTCTTTTTATTTAATCATTTTCCGGAATGTCGAAACGAAATAA 

2821 - + - + + + + + 2880 

TACATTTTTAGTCCAAAATCGCTAGGTATATTCTTAAAATTATCAAACATTTTGCATTCA 



ULi 
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2881 -i + + + + + _--+ 2940 

OAATGGCACAGCTTAATAACAAATTGGAAAGTCGAGGATTAGTCGGTGTTGAATGTATCA 

2941 + + + + + - -+ 3000 

MAQLNNKLESRGLVGVECIT 
340 350 

CCCCTTACTCGTACAAGTCACTCGCAATGGCTCTTCAAAGATGTGTTGAAGTTTTGTCAG O 

3001 + + + + + + 3060 

PYSYKSLAMALQRCVEVLSD > 
360 370 j"Q 

ATGAGGATCGAAGTGCTCTTGCTTTCGCAGTTGTGATGCCTCCTGGAGTTGATATACCCG 

o 

3061 + + + + + + 3120 

EDRSALAFAVVMPPGVDIPV CC 
380 390 
A nl894 

t 

TCAAGCTATGGTCATGTGTTATTCCAGTTGATATTTGTTCAAATGAAGAAGAACAATTGG 
3121 + + + + + + 3180 

KLWSCVIPVDICSNEEEQLD 
400 410 

| Intron 6 

ATGATGAAGTTGCGGATCGGTTGAAAAGACTCAGCAflGTATGAGTCTTGAAATTTGAAGA 
3181 + + + J.. + + + 3240 

DEVADRLKRLSK 
420 I 

TTTAAATTAACACTTAAAATTTCAGjACGTGGAGCTCTTCTCAGTGGAAAACGAATGCCCG 
3241 + + 1 + + + + 3300 

RGALLSGKRMPV 
430 440 

TTTTGACATTCAAAATTGATCATATTATCCATATGTTCTTGAAACACGTCGTTGATGCAC 
3301 + + + + + + 3360 

LTFKIDHI IHMFLKHVVDAQ 

450 460 
Intron 7 . 

aaactatcgccgtatgctgaaaatgtctcaactttcaattaaattttaaattttcagIaat 

3361 + + + + + T__ + 3420 

T I A n 

GGAATCTCAATTCTCGAGCAGCGTCTTCTTGAAATAGGAAACAATAATGTATCAGTACCG 
3421 + + + + + + 3480 

GI SI LEQRLLEIGNNNVSVP 
470 480 

GAGCGACATATACCATCACATTTCCAAAAATTCCGTCGTTCATCAGCCAGTGAGATGTAT 
3481 + + + + + + 3540 

E R H I PSHFQKFRRS SASEMY 
500 510 

CCAAAAACTACAGAAGAAACTGTGATCCGTCCTGAAGACTTCCCAAAGTTCATGCAATTG 
3541 + + + + + + 3600 

PKTTEETVIRP EDFPKFMQL 
520 530 

CACCAGAAATTCTATGACTCCCTCAAAAATTTTGCATGCTGTTAAAACCTATCGTGTACA 
3601 + + -- + + + + 3660 

HQKFYDSLKNFACC* 
540 

ATATTGCCTGTATATTCCCCTCGAAATACGTTTATACTTTTTCGCACGAGTTTTCTCATT 
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3661 + + + + -- - + + 3720 

TTTTCATTTGTACTTGTTTTATTTCTCTCCAAAATTTCAGATCTATCCCAAATGTTCTTA 

3721 + + - + - - + + + 3780 

AATTTAATGTTTTCTACAGATACTCAACACATCTTGTTTCATCTCATCCTTGCTTTTTTT 

3781 + + + + + + 3840 

TTTCAAATATATTCAGTTTCTTTTATAATTTTAATTAATCGAATTAATACATTCACGTAA 

3841 + + + + -- + + 3900 

AGAATTTCGTGGACTATTATTTTATCGCATCCAAATGATTTATTCCCTATTGTTCGAAAC 

3901 + + + + + + 3960 

TTCCAAATTGATCATTTTTAAACACGCCTCATTAAATTGAAAGTCGTACTTTTAGTCTCG 

3961 + + + + + + 4020 

AACATGAAGTAAGTTATTTTCTGTGTTCTAAATTCAAAGTGCATTCCAAAAGGACATTTG 

4021 + + + - + + + 4080 

ATGAGTTTTCACGAAAACCGTAATTTTTACAATTTCCTTTCAGTTTTGAAGATGTTCGAT 

4081 + + + + + + 4140 

TTCTTTCCTCTGTTGGCGTCATTACTACATTTGCTTTGCTGCTTCACTTTATCGAGATTC 

4141 + + + + -- + + 4200 

TTGCCATCAATGGAGTTCCATCTAGACCGATAGCAGTCTTCATATCATTATCCCTGTATA 

4201 + + + + + + 4260 

TTGTACTGTTTCAGTATTTTAACTTATCGATTACGTACTATATTCAGTGGTTCACTGTTT 

4261 + + + + --- + -+ 4320 

TCGGTCAATGGGTGACACGTGCTCGACGANNAATTTTCAACGAACGCAATCTCCTAGTCA 

4321 + + + + + + 4380 

CTTATCAACCAAGAGCCCTCACCCATG 
4381 + + 4407 
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FIG. 3 
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FIG. 4A 

ced-3 Genomic Sequence 



AGATCTGAAATAAGGTGATAAATTAATAAATTAAGTGTATTTCTGAGGAAATTTGACTGT 
1 + - + + + + + 60 

TTTAGCACAATTAATCTTGTTTCAGAAAAAAAGTCCAGTTTTCTAGATTTTTCCGTCTTA 
61 + + + - + + + 120 

TTGTCGAATTAATATCCCTATTATCACTTTTTCATGCTCATCCTCGAGCGGCACGTCCTC 
121 + --- + + + -- + + 180 

AAAGAATTGTGAGAGCAAACGCGCTCCCATTGACCTCCACACTCAGCCGCCAAAACAAAC 
181 -- + + + + -- + + 240 

GTTCGAACATTCGTGTGTTGTGCTCCTTTTCCGTTATCTTGCAGTCATCTTTTGTCGTTT 
241 + + + + -- + + 300 

TTTTCTTTGTTCTTTTTGTTGAACGTGTTGCTAAGCAATTATTACATCAATTGAAGAAAA 
301 + + + + + + 360 

GGCTCGCCGATTTATTGTTGCCAGAAAGATTCTGAGATTCTCGAAGTCGATTTTATAATA 
361 + + + + + + 420 

TTTAACCTTGGTTTTTGCATTGTTTCGTTTAAAAAAACCACTGTTTATGTGAAAAACGAT 
421 + + + + + ____+ 480 

TAGTTTACTAATAAAACTACTTTTAAACCTTTACCTTTACCTCACCGCTCCGTGTTCATG 
481 + + + + + + 540 

GCTCATAGATTTTCGATACTCAAATCCAAAAATAAATTTACGAGGGCAATTAATGTGAAA 
541 + + + + + + 600 

CAAAAACAATCCTAAGATTTCCACATGTTTGACCTCTCCGGCACCTTCTTCCTTAGCCCC 
601 + + + + + + 660 

ACCACTCCATCACCTCTTTGGCGGTGTTCTTCGAAACCCACTTAGGAAAGCAGTGTGTAT 
661 + + + + + + 720 

CTCATTTGGTATGCTCTTTTCGATTTTATAGCTCTTTGTCGCAATTTCAATGCTTTAAAC 
721 + + + + + + 780 

AATCCAAATCGCATTATATTTGTGCATGGAGGCAAATGACGGGGTTGGAATCTTAGATGA 
781 + + + + + + 840 

GATCAGGAGCTTTCAGGGTAAACGCCCGGTTCATTTTGTACCACATTTCATCATTTTCCT 
841 + + + + + + 900 

GTCGTCCTTGGTATCCTCAACTTGTCCCGGTTTTGTTTTCGGTACACTCTTCCGTGATGC 
901 + + + + + + 960 

CACCTGTCTCCGTCTCAATTATCGTTTAGAAATGTGAACTGTCCAGATGGGTGACTCATA 
961 + + + + + + 1020 

TTGCTGCTGCTACAATCCACTTTCTTTTCTCATCGGCAGTCTTACGAGCCCATCATAAAC 
1021 + + + + + + 1080 

TTTTTTTTCCGCGAAATTTGCAATAAACCGGCCAAAAACTTTCTCCAAATTGTTACGCAA 
1081 + --- - + + + + + 1140 

TATATACAATCCATAAGAATATCTTCTCAATGTTTATGATTTCTTCGCAGCACTTTCTCT 
1141 + + + + + + 1200 

TCGTGTGCTAACATCTTATTTTTATAATATTTCCGCTAAAATTCCGATTTTTGAGTATTA 
1201 + + + + + + 1260 



ATTTATCGTAAAATTATCATAATAGCACCGAAAACTACTAAAAATGGTAAAAGCTCCTTT 
+ + + + + + 1320^ 

' 7 

Repeat 1 ^ , *i ' 
£^ 

TAAATCGGCTCGACATTATCGTATTAAGGAATCACAAAATTCTGAGAATGCQTACTGCGC 
+ + + + + /!,-" -'-- + 1380 



AACATATTTGACGGCAAAATATCTCGTAGCGAAAACTACAGTAATTCTTTAAATGACTACy 
1381 + + + - + + - - 1440 
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FIG. 4B 

Repeat 1 



> <■ 

TGTAGCGCTTGTGTCGATTTACGGGCTCAATTTTTGAAAATAATTTTTTTTTTCGAATTT 
1441 + + + + + + 1500 



TGATAACCCGTAAATCGTCACAACGCTACAGTAGTCATTTAAAGGATTACTGTAGTTCTA 
1501 + + + + + + 1560 



GCTACGAGATATTTTGCGCGCCAAATATGACTGTAATACGCATTCTCTGAATTTTGTGTT 
1561 + + + + + + 1620 

TCCGTAATAATTTCACAAGATTTTGGCATTCCACTTTAAAGGCGCACAGGATTTATTCCA 
1621 + + + + + + 1680 

ATGGGTCTCGGCACGCAAAAAGTTTGATAGACTTTTAAATTCTCCTTGCATTTTTAATTC 
1681 + + + + + + 1740 

AATTACTAAAATTTTCGTGAATTTTTCTGTTAAAATTTTTAAAATCAGTTTTCTAATATT 
1741 + + + + + --- -+ 1800 

TTCCAGGCTGACAAACAGAAACAAAAACACAACAAACATTTTAAAAATCAGTTTTCAAAT 
1801 + + + + + + 1860 

TAAAAATAACGATTTCTCATTGAAAATTGTGTTTTATGTTTGCGAAAATAAAAGAGAACT 
1861 -- - + + + + + + 1920 

GATTCAAAACAATTTTAACAAAAAAAAACCCCAAAATTCGCCAGAAATCAAGATAAAAAA 
1921 + + + + + + 1980 

TTCAAGAGGGTCAAAATTTTCCGATTTTACTGACTTTCACCTTTTTTTTCGTAGTTCAGT 
1981 + + + + + - + 2040 

GCAGTTGTTGGAGTTTTTGACGAAAACTAGGAAAAAAATCGATAAAAATTACTCAAATCG 
2041 + + + + + + 2100 

AGCTGAATTTTGAGGACAATGTTTAAAAAAAAACACTATTTTTCCAATAATTTCACTCAT 
2101 + + + -- - + + + 2160 



TTTCAGACTAAATCGAAAATCAAATCGTACTCTGACTACGGGTCAGTAGAGAGGTCAACC 
2161 + + + + + + 2220 

ATCAGCCGAAGATGATGCGTCAAGATAGAAGGAGCTTGCTAGAGAGGAACATTATGATGT 

2221 + + + + -- + + 2280 

MMRQDRRSLLERNIMMF 
1 10 
T (n1040) 
I 

TCTCTAGTCATCTAAAAGTCGATGAAATTCTCGAAGTTCTCATCGCAAAACAAGTGTTGA 

2281 + --- + + -- - + - + + 2340 

S SHLKVDEI LEVLIAKQVLN 
20 30 

| Int ron 1 / 
ATAGTGATAATGGAGATATGATTAATGTGAGTTTTTAATCGAATAATAATTTTAAAAAAA • ; / 
2341 + - + + + .+ -* — + 2400 
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FIG. 4C 



I 

AATTGATAATATAAAGAATATTTTTGCAGTCATGTGGAACGGTTCGCGAGAAGAGACGGG 

2401 + + + + + + 2460 

SCGTVREKRRE 
50 

A (n718) 
I 

AGATCGTGAAAGCAGTGCAACGACGGGGAGATGTGGCGTTCGACGCGTTTTATGATGCTC 

2461 + + + + + + 2520 

IVKAVQRRGDVAFDAFYDAL 

60 70 

| Intron 2 

TTCGCTCTACGGGACACGAAGGACTTGCTGAAGTTCTTGAACCTCTCGCCAGATCGTAGG 

2521 + + + + + + 2580 

RSTGHEGLAEVLEPLARS 
80 90 

TTTTTAAAGTTCGGCGCAAAAGCAAGGGTCTCACGGAAAAAAGAGGCGGATCGTAATTTT 

2581 + + + + + + 2640 

GCAACCCACCGGCACGGTTTTTTCCTCCGAAAATCGGAAATTATGCACTTTCCCAAATAT 

2641 + + + + + + 2700 

TTGAAGTGAAATATATTTTATTTACTGAAAGCTCGAGTGATTATTTATTTTTTAACACTA 

2701 + + + - + + + 2760 

ATTTTCGTGGCGCAAAAGGCCATTTTGTAGATTTGCCGAAAATACTTGTCACACACACAC 

2761 + + + + + + 2820 

I 

ACACACATCTCCTTCAAATATCCCTTTTTCCAGTGTTGACTCGAATGCTGTCGAATTCGA 

2821 + + + + + + 2880 

VDSNAVEFE 
100 

GTGTCCAATGTCACCGGCAAGCCATCGTCGGAGCCGCGCATTGAGCCCCGCCGGCTACAC 

2881 -- - + + + + + + 2940 

CPMSPASHRRSRALSPAGYT 

110 120 

TTCACCGACCCGAGTTCACCGTGACAGCGTCTCTTCAGTGTCATCATTCACTTCTTATCA 

2941 + + + - - + + + 3000 

SPTRVHRDSVSSVSSFTSYQ 

130 140 

GGATATCTACTCAAGAGCAAGATCTCGTTCTCGATCGCGTGCACTTCATTCATCGGATCG 

3001 + + -- - + + + + 3060 

DIYSRARSRSRSRALHSSDR 

150 160 

■ ... '*> 

I intron 3 

acacaattattcatctcctccagtcaacgcatttcccagccaaccttgtatgttgatgcgJ 

3061 - + + + + -- : + --- -V 3120 

HNYSSPPVNAFPSQPS 

170 



Title: CLONING, SEQUENCING, AND CHARACTERIZATION 
OF TWO CELL DEATH GENES AND USES THEREFOR 

Applicant(s): H. Robert Horvitz et al. 

Filing Date: May 24, 2000 Serial No.: 09/577,897 

Page 11 of 23 Customer No.: 21559 

11/23 

FIG. 4D 

Repeat 1 

AACACTAAATTCTGAGAATGCGCATTACTCAACATATTTGACGCGCAAATATCTCGTAGC 
3121 + + + + + + 3180 



GAAAAATACAGTAACCCTTTAAATGACTATTGTAGTGTCGATTTACGGGCTCGATTTTCG 
3181 + + + + + + 3240 

> 

AAACGAATATATGCTCGAATTGTGACAACGAATTTTAATTTGTCATTTTTGTGTTTTCTT 
3241 + + + + + + 3300 

Repeat 1 

< — — — — - 

TTGATATTTTTGATCAATTAATAAATTATTTCCGTAAACAGACACCAGCGCTACAGTACT 
3301 + + + + + + 3360 



CTTTTAAAGAGTTACAGTAGTTTTCGCTTCAAGATATTTTGAAAAGAATTTTAAACATTT 
3361 + + + + + + 3420 

TGAAAAAAAATCATCTAACATGTGCCAAAACGCTTTTTTCAAGTTTCGCAGATTTTTTGA 
3421 + + + + + + 3480 

Repeat 2 

TTTTTTTCATTCAAGATATGCTTATTAACACATATAATTATCATTAATGTGAATTTCTTG 
3481 + + + + + + 3540 



TAGAAATTTTGGGCTTTTCGTTCTAGTATGCTCTACTTTTGAAATTGCTCAACGAAAAAA 
3541 + + + + + + 3600 

TCATGTGGTTTGTTCATATGAATGACGAAAAATAGCAATTTTTTATATATTTTCCCCTAT 
3601 + + + + + + 3660 

TCATGTTGTGCAGAAAAATAGTAAAAAAGCGCATGCATTTTTCGACATTTTTTACATCGA 
3661 + + + + + + 3720 

> 

ACGACAGCTCACTTCACATGCTGAAGACGAGAGACGCGGAGAAATACCACACATCTTTCT 
3721 + + + + _ + + 3780 

i 

Repeat 2 /V* 

< — — — _ +r _ _ >_ ;J 

GCGTCTCTCGTCTTCAGCATGTGAAATGGGATCTCGG 
3781 + + + — - + P + 3840 



ATGTAAAAAATGCATGCGTTTTTTTACACTTTTCTGCACAAATGAATAGGGGGAAAATGT 
3841 + + + + + + 3900 
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o FIG. 4E 

ATTAAAATACATTTTTTGTATTTTTCAACATCACATGATTAACCCCATTATTTTTTCGTT 
3901 + + + + + + 3960 

GAGCAACTTAAAAAGTAGAGAATATTAGAGCGAAAACCAAAATTTCTTCAAGATATTACC 
3961 + + + + + + 4020 

TTTATTGATAATTATAGATGTTAATAAGCATATCTTGAATGAAAGTCAGCAAAAATATGT 

4021 + + + + + + 4080 

GCGAAACACCTGAAAAAAATCAAAAATTCTGCGAAAATTGAAAAAATGCATTAAAATACA 

4081 + + + + + + 4140 

TTTTTGCATTTTTCTACATCACATGAATGTAGAAAATTAAAAGGGAAATCAAAATTTCTA 

4141 + + + + + + 4200 

GAGGATATAATTGAATGAAACATTGCGAAATTAAAATGTGCGAAACGTCAAAAAAGAGGA 
4201 + + + + + + 4260 

I 

AATTTGGGTATCAAAATCGATCCTAAAACCAACACATTTCAGCATCCGCCAACTCTTCAT 

4261 + + + -- -- + + + 4320 

SANSS F 
180 

TCACCGGATGCTCTTCTCTCGGATACAGTTCAAGTCGTAATCGCTCATTCAGCAAAGCTT 

4321 + + + + - -- + + 4380 

TGCSSLGYSSSRNRSFSKAS 
190 200 

CTGGACCAACTCAATACATATTCCATGAAGAGGATATGAACTTTGTCGATGCACCAACCA 

4381 + + + -- + + + 4440 

GPTQYI FHEEDMNFVDAPT I 
210 220 

TAAGCCGTGTTTTCGACGAGAAAACCATGTACAGAAACTTCTCGAGTCCTCGTGGAATGT 

4441 + + + + + + 4500 

SRVFDEKTMYRNFSSPRGMC 
230 240 

GCCTCATCATAAATAATGAACACTTTGAGCAGATGCCAACACGGAATGGTACCAAGGCCG 

4501 + + + + -- + + 4560 

LIINNEHFEQMPTRNGTKAD 
250 260 

ACAAGGACAATCTTACCAATTTGTTCAGATGCATGGGCTATACGGTTATTTGCAAGGACA 

4561 + + + _- + __,: + + 4620 

KDNLTNLFRCMGYTVICKDN 

270 280 

| Intron 4 / - 7 i^l 
ATCTGACGGGAAGGGTACGGCGAAATTATATTACC^A^CGCGAAATTTGCCATTTTGCG 
4621 + + -- + --- + ^ + + 4680 

L T G R , /; 
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FIG.4F 

Repeat 3 

■ > 

CCGAAAATGTGGCGCCCGGTCTCGACACGACAATTTGTGTTAAATGCAAAAATGTATAAT 

4681 + + + + + + 4740 

TTTGCAAAAAACAAAATTTTGAACTTCCGCGAAAATGATTTACCTAGTTTCGAAATTTTC 

4741 + + + + + + 4800 

GTTTTTTCCGGCTACATTATGTGTTTTTTCTTAGTTTTTCTATAATATTTGATGTAAAAA 

4801 + + + + + + 4860 

ACCGTTTGTAAATTTTCAGACAATTTTCCGCATACAAAACTTGATAGCACGAAATCAATT 

4861 + + + + + + 4920 

TTCTGAATTTTCAAAATTATCCAAAAATGCACAATTTAAAATTTGTGAAAATTGGCAAAC 

4921 + + + + + + 4980 

GGTGTTTCAATATGAAATGTATTTTTAAAAACTTTAAAAACCACTCCGGAAAAGCAATAA 

4981 + + + + + + 5040 

AAATCAAAACAACGTCACAATTCAAATTCAAAAGTTATTCATCCGATTTGTTTATTTTTG 

5041 + + + + + + 5100 

CAAAATTTGAAAAAATCATGAAGGATTTAGAAAAGTTTTATAACATTTTTTCTAGATTTT 

5101 + + + + + + 5160 

TCAAAATTTTTTTTAACAAATCGAGAAAAAGAGAATGAAAAATCGATTTTAAAAATATCC 
5161 + + + + + + 5220 

Repeat 3 

< — " "" ' 

ACAGCTTCGAGAGTTTGAAATTACAGTACTCCTTAAAGGCGCACACCCCATTTGCATTGG 

5221 + + + + + + 5280 



ACCAAAAATTTGTCGTGTCGAGACCAGGTACCGTAGTTTTTGTCGCAAAAATTGCACCAT 

5281 + + + + + + 5340 

TGGACAATAAACCTTCCTAATCACCAAAAAGTAAAATTGAAATCTTCGAAAAGCCAAAAA 

5341 + + + + + + 5400 

ATTCAAAAAAAAAGTCGAATTTCGATTTTTTTTTTGGTTTTTTGGTCCCAAAAACCAAAA 

5401 + + + + + + 5460 

AAATCAATTTTCTGCAAAATACCAAAAAGAAACCCGAAAAAATTTCCCAGCCTTGTTCCT 

5461 + + + + + + 5520 

I 

AATGTAAACTGATATTTAATTTCCAGGGAATGCTCCTGACAATTCGAGACTTTGCCAAAC 

5521 + + + + + + 5580 

GMLLTIRDFAKH 
290 300 

ACGAATCACACGGAGATTCTGCGATACTCGTGATTCTATCACACGGAGAAGAGAATGTGA 

5581 - -- + + + + + + 5640 

ESHGDSAILVILSHGEENVI 

310 , 320 

, • 

TTATTGGAGTTGATGATATACCGATTAGTACACACGAGATATATGAXCTTCTCAACGCGG 

5641 + + - + + + + 5700 

IGVDDIPISTHEIYDLLNAA 

330 340 
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FIG. 4G 

A (n2433) 
| | Intron 5 

CAAATGCTCCCCGTCTGGCGAATAAGCCGAAAATCGTTTTTGTGCAGGCTTGTCGAGGCG 

5701 + + + -- + + + 5760 

NAPRLANKPKIVFVQACRGE 

350 360 

I 

GTTCGTTTTTTATTTTAATTTTAATATAAATATTTTAAATAAATTCATTTTCAGAACGTC 

5761 + + + + + + 5820 

R R 

GTGACAATGGATTCCCAGTCTTGGATTCTGTCGACGGAGTTCCTGCATTTCTTCGTCGTG 

5821 + + - --- + + + + 5880 

DNGFPVLDSVDGVPAFLRRG 

370 380 

T (n1165) 
I 

GATGGGACAATCGAGACGGGCCATTGTTCAATTTTCTTGGATGTGTGCGGCCGCAAGTTC 

5881 + + + + + + 5940 

WDNRDGPLFNFLGCVRPQVQ 

390 400 

| Intron 6 

AGGTTGCAATTTAATTTCTTGAATGAGAATATTCCTTCAAAAAATCTAAAATAGATTTTT 
5941 + + + + + --- -+ 6000 

ATTCCAGAAAGTCCCGATCGAAAAATTGCGATATAATTACGAAATTTGTGATAAAATGAC 
6001 + + + + + + 6060 

Repeat 4 

AAACCAATCAGCATCGTCGATCTCCGCCCACTTCATCGGATTGGTTTGAAAGTGGGCGGA 
6061 + -- -- + + + + + 6120 

> 

GTGAATTGCTGATTGGTCGCAGTTTTCAGTTTAGAGGGAATTTAAAAATCGCCTTTTCGA 
6121 + + + + + + 6180 

AAATTAAAAATTGATTTTTTCAATTTTTTCGAAAAATATTCCGATTATTTTATATTCTTT 
6181 + - + + + + + 6240 

A (n717) 
I 

GGAGCGAAAGCCCCGTCCTGTAAACATTTTTAAATGATAATTAATAAATTTTTGCAGCAA 
6241 - + + + - + --- + -_ -+ 6300 

Q 

T (n1949) 

GTGTGGAGAAAGAAGCCGAGCCAAGCTGACATTCTGATTCGATACGCAACGACAGCTCAA 

6301 + + + -;-- + ---;-;- + -+ 6360 

VWRKKPSQADILIRYATTAQ 

410 420 
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FIG. 4H 

A (n1286) 
I 

TATGTTTCGTGGAGAAACAGTGCTCGTGGATCATGGTTCATTCAAGCCGTCTGTGAAGTG 

6361 + + -- + + -- + + 6420 

YVSWRNSARGSWFIQAVCEV 
430 440 

T (n1129, n1164) 
I 

TTCTCGACACACGCAAAGGATATGGATGTTGTTGAGCTGCTGACTGAAGTCAATAAGAAG 

6421 + + + + + + 6480 

FSTHAKDMDVVELLTEVNKK 
450 460 

T (n2430) A (n2426) 

I | | Intron 7 

GTCGCTTGTGGATTTCAGACATCACAGGGATCGAATATTTTGAAACAGATGCCAGAGGTA 

6481 + + + + + + 6540 

VACGFQTSQGSNILKQMPE 
470 480 

Repeat 5 

CTTGAAACAAACAATGCATGTCTAACTTTTAAGGACACAGAAAAATAGGCAGAGGCTCCT 
6541 + + + + + + 6600 

> 

TTTGCAAGCCTGCCGCGCGTCAACCTAGAATTTTAGTTTTTAGCTAAAATGATTGATTTT 
6601 + + + + -- + + 6660 

GAATATTTTATGCTAATTTTTTTGCGTTAAATTTTGAAATAGTCACTATTTATCGGGTTT 
6661 + + + + + + 6720 

CCAGTAAAAAATGTTTATTAGCCATTGGATTTTACTGAAAACGAAAATTTGTAGTTTTTC 
6721 + + + + + + 6780 

AACGAAATTTATCGATTTTTAAATGTAAAAAAAAATAGCGAAAATTACATCAACCATCAA 
6781 + + + + + - -+ 6840 

GCATTTAAGCCAAAATTGTTAACTCATTTAAAAATTAATTCAAAGTTGTCCACGAGTATT 
6841 + + -- + + + + 6900 

Repeat 5 

<— . 

ACACGGTTGGCGCGCGGCAAGTTTGCAAAACGACGCTCCGCCTCTTTTTCTGTGCGGCTT 
6901 + + + + + + 6960 

T (n1163) 

0> I | 

GAAAACAAGGGATCGGTTTAGATTTTTCCCCAAAATTTAAATTAAATTTCAGATGACATC 

6961 + + + -?- + - + + 7020 

; \ /'•>' M T S 

* ' \ . t 

CCGCCTGCTCAAAAAGTTCTACTTTTGGCCGGAAGCACGAAACTCTGCCGTCTAAAATTC 

7021 + + + + + + 7080 

RLLKKFYFWP EARNSAV* 
490 500 
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FIG. 41 

ACTCGTGATTCATTGCCCAATTGATAATTGTCTGTATCTTCTCCCCCAGTTCTCTTTCGC 

7081 + + + + + + 7140 

CCAATTAGTTTAAAACCATGTGTATATTGTTATCCTATACTCATTTCACTTTATCATTCT 

7141 + + + + + + 7200 

ATCATTTCTCTTCCCATTTTCACACATTTCCATTTCTCTACGATAATCTAAAATTATGAC 

7201 + + + + + + 7260 

GTTTGTGTCTCGAACGCATAATAATTTTAATAACTCGTTTTGAATTTGATTAGTTGTTGT 

7261 + + + + - --- + + 7320 

GCCCAGTATATATGTATGTACTATGCTTCTATCAACAAAATAGTTTCATAGATCATCACC 
7321 + + + -- -- + - --- + + 7380 

CCAACCCCACCAACCTACCGTACCATATTCATTTTTGCCGGGAATCAATTTCGATTAATT 
7381 + + + + + + 7440 

TTAACCTATTTTTTCGCCACAAAAAATCTAATATTTGAATTAACGAATAGCATTCCCATC 
7441 + + + + + + 7500 

TCTCCCGTGCCGGAATGCCTCCCGGCCTTTTAAAGTTCGGAACATTTGGCAATTATGTAT 
7501 + + + + + + 7560 

AAATTTGTAGGTCCCCCCCATCATTTCCCGCCCATCATCTCAAATTGCATTCTTTTTTCG 
7561 + + --- - + + + + 7620 

CCGTGATATCCCGATTCTGGTCAGCAAAGATCT 
7621 + + + --- 7653 
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FIG. 7 

Lines 

1 01 MMRQDRRS LLERNIMMFSSHLKVDE I LEVL I AKQVLNSDNGDMINS CGTV 50 

2 W_ LE. . .K.QA.L. .D V. . . .R.E 

3 TVS - SLI . . R M 

1 51 REKRREIVKAVQRRGDVAFDAFYDALRSTGHEGLAEVLEPLARSVDSNAV 100 

2 .DNEK R..E D. . .ND. .D. .M. . S .P .P. 

3 

1 101 EFECPMSPASHRRSRALSPAGYTSPTRVHRDSVSSVSSFTS_YQDIYSRA 149 

2 PM S P .A I T. . .V. . . . 

3 S 

1 150 RSRSR_SRALHSSDRHNYSSPPVNAFPSQPSSANSSFTGCSSLGYSSSRN 198 

2 ..S..S..P.Q M. AA_TS A 

3 T... ..P..T V . . S_ . S • Q . . . A S T 

1 199 RSFSKASGPTQYIFHEEDMNFVDAPTISRVFDEKTMYRNFSSPRGMCLI 247 

2 T.AQS Y H L... 

3 . .Y AHS Y H T. . .L. . . 

1 248 INNEHFEQMPTRNGTKADKDNLTNLFRCMGYTVICKDNLTGRGMLLTIRD 297 

2 I E..S-..S 

3 P IS I.H M 

1 298 FAKHESHGDSAILVI LSHGEENVI IGVDDIP I STHEI YDLLNAANAPRLA 347 

2 . GRNDM VSVNV 

3 ...N.T VSVNV X 

1 348 NKPKIVFVQACRGERRDNGFPVLDSVDGVPAFLRRGWDNRDGPLFNFLGC 397 

2 L SLI 

3 L V LI KG 

1 398 VRPQVQQVWRKKPSQADILIRYATTAQYVSWRNSARGSWFIQAVCEVFST 447 

2 M..A L 

3 A A L 

1 448 HAKDMDVVELLTEVNKKVACGFQTSQGSNILKQMPEMTSRLLKKFYFWPE 497 

2 L 

3 A L 

1 498 ARNSAV 503 

2 DRG • • ■ - . 

* r 3 D».RS»»» 



Line 1 C. elegans 
Line 2 C. briggsae 
Line 3 C. vulgaris 
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